#-*- coding: utf-8 -*-

import urllib.request
import urllib.parse
import re
import urllib.request,urllib.parse,http.cookiejar


def getHtml(url):
    cj=http.cookiejar.CookieJar()
    opener=urllib.request.build_opener(urllib.request.HTTPCookieProcessor(cj))
    opener.addheaders=[('User-Agent','Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.101 Safari/537.36'),('Cookie','4564564564564564565646540')]

    urllib.request.install_opener(opener)
    
    html_bytes = urllib.request.urlopen( url ).read()
    html_string = html_bytes.decode( 'utf-8' )
    return html_string

#url = http://zst.aicai.com/ssq/openInfo/
#最终输出结果格式如：2015075期开奖号码：6,11,13,19,21,32, 蓝球：4
html = getHtml("http://zst.aicai.com/ssq/openInfo/")
#<table class="fzTab nbt"> </table>
print('\n\n\n\n\n-----------------------html-------------------------------------------------------\n')
print(html)
table = html[html.find('<table class="fzTab nbt">') : html.find('</table>')]
print('\n\n\n\n\n-------------------------table-----------------------------------------------------\n')
print(repr(table))
#<tr onmouseout="this.style.background=''" onmouseover="this.style.background='#fff7d8'">
#<tr \r\n\t\t                  onmouseout=
tmp = table.split('<tr \r\n\t\t                  onmouseout=')
print('\n\n\n\n\n---------------------------tmp---------------------------------------------------\n')
#print(tmp)
print(len(tmp))
print('\n\n')
#for i in tmp:
#	print(repr(i))
for i in range(len(tmp)):
	trs = tmp[i]
	tr = trs[: trs.find('</tr>')]
	print(tr)
	number = tr.split('<th   >')[1].split('</th>')[0]
	print(number + '期开奖号码：')
	redtmp = tr.split('<th  class="redColor sz12" >')
	reds = redtmp[1:len(redtmp)-1]#去掉第一个和最后一个没用的元素
	#print(reds)
	for redstr in reds:
    		print(redstr.split('</th>')[0] + ",")
	print('蓝球：')
	blue = tr.split('<th  class="blueColor sz12" >')[1].split('</th>')[0]
	print(blue)
